% Dean and Ghemawat (2008), Communications of the ACM 51(1):107--113.
% The title is stored in Title Case; only the coined name MapReduce is
% brace-protected, so bibliography styles stay free to recase the rest.
@article{MapReduce,
  author    = {Dean, Jeffrey and Ghemawat, Sanjay},
  title     = {{MapReduce}: Simplified Data Processing on Large Clusters},
  journal   = {Communications of the ACM},
  volume    = {51},
  number    = {1},
  pages     = {107--113},
  year      = {2008},
  publisher = {ACM},
  doi       = {10.1145/1327452.1327492},
  url       = {http://portal.acm.org/citation.cfm?id=1327492},
  file      = {:Users/Josh/Library/Application Support/Mendeley Desktop/Downloaded/Dean, Ghemawat - 2008 - MapReduce Simplified data processing on large clusters.pdf:pdf}
}
% Hoefler, Lumsdaine and Dongarra (2009), pp. 240--249.
% The containing work is a Springer proceedings volume rather than a
% periodical, so it is recorded as a conference paper with a booktitle.
% MapReduce and MPI are brace-protected to survive sentence-casing styles.
@inproceedings{MPI,
  author    = {Hoefler, Torsten and Lumsdaine, Andrew and Dongarra, Jack},
  title     = {Towards Efficient {MapReduce} Using {MPI}},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing Interface},
  pages     = {240--249},
  year      = {2009},
  publisher = {Springer},
  url       = {http://www.springerlink.com/index/911500586j046m4n.pdf},
  file      = {:Users/Josh/Documents/CMPUT 681/Project/Papers/fulltext2.pdf:pdf}
}
% Huang, Liu, Abali and Panda (2006), paper in the ICS '06 proceedings; the
% venue therefore lives in booktitle instead of journal.
% NOTE(review): pages holds a single number, presumably only the first page
% of the paper -- TODO confirm the full range against the DOI record.
@inproceedings{HPCVM,
  author    = {Huang, Wei and Liu, Jiuxing and Abali, Bulent and Panda, Dhabaleswar K.},
  title     = {A Case for High Performance Computing with Virtual Machines},
  booktitle = {Proceedings of the 20th Annual International Conference on Supercomputing ({ICS} '06)},
  pages     = {125},
  year      = {2006},
  publisher = {ACM Press},
  address   = {New York, New York, USA},
  doi       = {10.1145/1183401.1183421},
  isbn      = {1595932828},
  url       = {http://portal.acm.org/citation.cfm?doid=1183401.1183421},
  file      = {:Users/Josh/Documents/CMPUT 681/Project/Papers/10.1.1.81.7050.pdf:pdf}
}
% Ibrahim et al. (2009), two-page paper in the 18th ACM HPDC proceedings.
% CLOUDLET, MapReduce and ACM are brace-protected against style recasing.
% The last author is spelled out as Qi, Li to agree with the MRVM entry in
% this file, which lists the same author in full.
@inproceedings{Cloudlet,
  author    = {Ibrahim, Shadi and Jin, Hai and Cheng, Bin and Cao, Haijun and Wu, Song and Qi, Li},
  title     = {{CLOUDLET}: Towards {MapReduce} Implementation on Virtual Machines},
  booktitle = {Proceedings of the 18th {ACM} International Symposium on High Performance Distributed Computing},
  pages     = {65--66},
  year      = {2009},
  publisher = {ACM},
  isbn      = {9781605585871},
  url       = {http://dl.acm.org/citation.cfm?id=1551624},
  file      = {:Users/Josh/Documents/CMPUT 681/Project/Papers/p65-ibrahim.pdf:pdf}
}
% Ibrahim et al. (2009), pp. 519--528 of the Springer volume Cloud Computing.
% Recorded as a paper in a proceedings volume (booktitle) rather than as a
% journal article. No issue number is stored: the exported value 2007 does
% not correspond to any issue and would print as a bogus number.
% The keywords list repairs a PDF line-break artefact that had split
% "distributed file system" into two fragments.
@inproceedings{MRVM,
  author    = {Ibrahim, Shadi and Jin, Hai and Lu, Lu and Qi, Li and Wu, Song and Shi, Xuanhua},
  title     = {Evaluating {MapReduce} on Virtual Machines: The {Hadoop} Case},
  booktitle = {Cloud Computing},
  pages     = {519--528},
  year      = {2009},
  publisher = {Springer},
  url       = {http://www.springerlink.com/index/b658142m12217300.pdf},
  keywords  = {cloud computing,data intensive,distributed file system,hadoop,mapreduce,virtual machine},
  file      = {:Users/Josh/Documents/CMPUT 681/Project/Papers/fulltext.pdf:pdf}
}
% Jiang, Ooi, Shi and Wu (2010), Proceedings of the VLDB Endowment 3(1--2).
% Given names are stored in full so the style decides how to abbreviate them;
% the combined issue is written as a range with a double hyphen.
% NOTE(review): expanded given names should be checked against the paper.
@article{Hadoop,
  author    = {Jiang, Dawei and Ooi, Beng Chin and Shi, Lei and Wu, Sai},
  title     = {The Performance of {MapReduce}: An In-Depth Study},
  journal   = {Proceedings of the VLDB Endowment},
  volume    = {3},
  number    = {1--2},
  pages     = {472--483},
  year      = {2010},
  publisher = {VLDB Endowment},
  url       = {http://dl.acm.org/citation.cfm?id=1920903},
  file      = {:Users/Josh/Documents/CMPUT 681/Project/Papers/p472-jiang.pdf:pdf}
}
% Lin and Dyer (2010), Synthesis Lectures on Human Language Technologies 3(1).
% The doi is the identifier embedded in the publisher URL below.
% Only MapReduce is brace-protected in the title; the rest may be recased.
@article{Book,
  author    = {Lin, Jimmy and Dyer, Chris},
  title     = {Data-Intensive Text Processing with {MapReduce}},
  journal   = {Synthesis Lectures on Human Language Technologies},
  volume    = {3},
  number    = {1},
  pages     = {1--177},
  year      = {2010},
  publisher = {Morgan \& Claypool Publishers},
  doi       = {10.2200/S00274ED1V01Y201006HLT007},
  isbn      = {9781608453429},
  url       = {http://www.morganclaypool.com/doi/abs/10.2200/S00274ED1V01Y201006HLT007},
  file      = {:Users/Josh/Library/Application Support/Mendeley Desktop/Downloaded/Lin, Dyer - 2010 - Data-Intensive Text Processing with MapReduce.pdf:pdf}
}

% Melnik, Raghavan, Yang and Garcia-Molina (2001), ACM TOIS 19(3):217--241.
% The first author's surname is Melnik, matching the attached PDF file name.
% The url field holds exactly one address, since a url value cannot carry
% two space-separated links; the doi field identifies the same record.
@article{InvInd,
  author    = {Melnik, Sergey and Raghavan, Sriram and Yang, Beverly and Garcia-Molina, Hector},
  title     = {Building a Distributed Full-Text Index for the {Web}},
  journal   = {ACM Transactions on Information Systems},
  volume    = {19},
  number    = {3},
  pages     = {217--241},
  year      = {2001},
  month     = jul,
  publisher = {ACM},
  doi       = {10.1145/502115.502116},
  issn      = {1046-8188},
  url       = {http://dl.acm.org/citation.cfm?id=502116},
  file      = {:Users/Josh/Downloads/p217-melnik.pdf:pdf}
}
% Textbook: Introduction to Parallel Computing (2003).
% NOTE(review): the co-authors and the edition were filled in from the
% publisher's catalogue record -- confirm against the copy actually cited.
@book{grama2003introduction,
  author    = {Grama, Ananth and Gupta, Anshul and Karypis, George and Kumar, Vipin},
  title     = {Introduction to Parallel Computing},
  edition   = {Second},
  year      = {2003},
  publisher = {Addison Wesley Longman}
}

% Jedlitschka and Pfahl (2005), paper in the 2005 International Symposium on
% Empirical Software Engineering.
% The exported record carries only a page count (10 pp.) and no page range,
% so the count is kept in note instead of a malformed pages value.
% NOTE(review): look up the real page range and the expanded given names.
@inproceedings{jedlitschka2005reporting,
  author    = {Jedlitschka, Andreas and Pfahl, Dietmar},
  title     = {Reporting Guidelines for Controlled Experiments in Software Engineering},
  booktitle = {2005 International Symposium on Empirical Software Engineering},
  year      = {2005},
  publisher = {IEEE},
  note      = {10 pp.}
}

% Textbook: Matrix Theory with Applications (1991).
% NOTE(review): given name expanded from the initials J. L. -- confirm.
@book{goldberg1991matrix,
  author    = {Goldberg, Jack L.},
  title     = {Matrix Theory with Applications},
  year      = {1991},
  publisher = {McGraw-Hill College}
}

% Book: Hadoop, The Definitive Guide (2010 printing).
% Hadoop is brace-protected; the rest of the title is stored in Title Case
% so that either sentence-case or title-case styles render it correctly.
@book{white2010hadoop,
  author    = {White, Tom},
  title     = {{Hadoop}: The Definitive Guide},
  year      = {2010},
  publisher = {Yahoo Press}
}

% Online tutorial by Michael G. Noll on setting up a multi-node cluster.
% Product names are brace-protected so sentence-casing styles do not turn
% them into "hadoop", "ubuntu" and "linux"; the author is in Last, First form.
@misc{hadooptutorial2011,
  author       = {Noll, Michael G.},
  title        = {Running {Hadoop} on {Ubuntu} {Linux} (Multi-Node Cluster)},
  year         = {2011},
  howpublished = {\url{http://www.michael-noll.com/tutorials/running-hadoop-on-ubuntu-linux-multi-node-cluster/}}
}

% The ClueWeb09 dataset, credited to an institutional author.
% The author value has an extra pair of braces: without it BibTeX splits the
% text at " and " and at the comma, producing two nonsensical personal names.
@misc{clueweb,
  author       = {{The Lemur Project, University of Massachusetts and Carnegie Mellon University}},
  title        = {The {ClueWeb09} Dataset},
  year         = {2009},
  howpublished = {\url{http://lemurproject.org/about.php}}
}

% Wikimedia database dump download site, cited as a web resource (2011).
@misc{wikidumps,
  author       = {Wikimedia},
  title        = {Wikimedia Wiki Dumps},
  howpublished = {\url{http://dumps.wikimedia.org/}},
  year         = {2011}
}

% Levering and Cutler (2006), paper in the DocEng 2006 proceedings.
% Both authors use the Last, First form, the page range uses a double
% hyphen, and the acronym HTML is brace-protected against lowercasing.
% NOTE(review): given names were expanded from initials -- confirm.
@inproceedings{WebStats,
  author       = {Levering, Ryan and Cutler, Michal},
  title        = {The Portrait of a Common {HTML} Web Page},
  booktitle    = {{DocEng} 2006},
  pages        = {198--204},
  year         = {2006},
  organization = {ACM}
}

% Wikipedia project page reporting words-per-article statistics (2008).
% The page name Wikipedia:Words is brace-protected: with no space after the
% colon, sentence-casing styles would otherwise lowercase the W of Words.
@misc{WikiStats,
  author       = {Wikipedia},
  title        = {{Wikipedia:Words} per article},
  year         = {2008},
  howpublished = {\url{http://en.wikipedia.org/wiki/Wikipedia:Words_per_article}}
}

